Qiying's workspace
Runs
11
Name
11 visualized
State
Notes
User
Tags
Created
Runtime
Sweep
actor_rollout_ref.actor.clip_ratio
actor_rollout_ref.actor.clip_ratio2
actor_rollout_ref.actor.clip_ratio_high
actor_rollout_ref.actor.clip_ratio_low
actor_rollout_ref.actor.entropy_coeff
actor_rollout_ref.actor.fsdp_config.fsdp_size
actor_rollout_ref.actor.fsdp_config.optimizer_offload
actor_rollout_ref.actor.fsdp_config.param_offload
actor_rollout_ref.actor.fsdp_config.wrap_policy.min_num_params
actor_rollout_ref.actor.grad_clip
actor_rollout_ref.actor.kl_loss_coef
actor_rollout_ref.actor.kl_loss_type
actor_rollout_ref.actor.lm_loss_weight
actor_rollout_ref.actor.optim.lr
actor_rollout_ref.actor.optim.lr_warmup_steps
actor_rollout_ref.actor.optim.lr_warmup_steps_ratio
actor_rollout_ref.actor.optim.total_training_steps
actor_rollout_ref.actor.optim.warmup_style
actor_rollout_ref.actor.optim.weight_decay
actor_rollout_ref.actor.ppo_epochs
actor_rollout_ref.actor.ppo_max_token_len_per_gpu
actor_rollout_ref.actor.ppo_mini_batch_size
actor_rollout_ref.actor.shuffle
actor_rollout_ref.actor.strategy
actor_rollout_ref.actor.ulysses_sequence_parallel_size
actor_rollout_ref.actor.use_dynamic_bsz
actor_rollout_ref.actor.use_kl_loss
actor_rollout_ref.hybrid_engine
actor_rollout_ref.model.enable_gradient_checkpointing
actor_rollout_ref.model.override_config.attention_dropout
actor_rollout_ref.model.override_config.embd_pdrop
actor_rollout_ref.model.override_config.resid_pdrop
actor_rollout_ref.model.path
actor_rollout_ref.model.tokenizer_path
actor_rollout_ref.model.use_remove_padding
actor_rollout_ref.ref.fsdp_config.param_offload
actor_rollout_ref.ref.fsdp_config.wrap_policy.min_num_params
actor_rollout_ref.ref.log_prob_max_token_len_per_gpu
actor_rollout_ref.ref.log_prob_use_dynamic_bsz
actor_rollout_ref.ref.ulysses_sequence_parallel_size
actor_rollout_ref.rollout.disable_log_stats
actor_rollout_ref.rollout.do_sample
actor_rollout_ref.rollout.dtype
actor_rollout_ref.rollout.enable_chunked_prefill
Finished
-
zhangchi-usc1992
12h 11m
-
0.2
-
0.28
0.2
0
32
true
true
0
1
0
low_var_kl
-
0.000001
10
0
200
constant
0.1
1
20480
32
false
fsdp
4
true
false
true
true
-
-
-
/mnt/hdfs/zhangchi.usc1992_ssd_hldy/public_exp/models/Qwen2.5-Math-7B_32k
-
true
true
0
30720
true
4
true
true
bfloat16
true
Finished
-
zhangchi-usc1992
2d 18h 17m 44s
-
0.2
-
0.28
0.2
0
32
true
true
0
1
0
low_var_kl
-
0.000001
10
0
300
constant
0.1
1
20480
32
false
fsdp
4
true
false
true
true
-
-
-
/mnt/hdfs/zhangchi.usc1992_ssd_hldy/public_exp/models/Qwen3-30B-A3B-Base
-
true
true
0
30720
true
4
true
true
bfloat16
true
Finished
-
tongyuxuan361
11d 9h 45m 56s
-
0.2
-
0.28
0.2
0
-1
true
true
0
1
0
low_var_kl
-
0.000001
10
0
874
constant
0.1
1
22528
32
false
fsdp
8
true
false
true
true
0
0
0
/mnt/hdfs/haruna/home/byte_data_seed/ssd_hldy/user/tongyx361/data/verl/models/Qwen2.5-32B
-
true
true
0
22528
true
8
true
true
bfloat16
true
Crashed
-
tongyuxuan361
21h 56m 27s
-
0.2
-
0.28
0.2
0
-1
true
true
0
1
0
low_var_kl
-
0.000001
10
0
3499
constant
0.1
1
22528
32
false
fsdp
8
true
false
true
true
0
0
0
/mnt/hdfs/haruna/home/byte_data_seed/ssd_hldy/user/tongyx361/data/verl/models/Qwen2.5-32B
-
true
true
0
22528
true
8
true
true
bfloat16
true
Crashed
-
tongyuxuan361
4d 13h 8m 31s
-
0.2
-
0.28
0.2
0
-1
true
true
0
1
0
low_var_kl
-
0.000001
10
0
3499
constant
0.1
1
22528
32
false
fsdp
8
true
false
true
true
0
0
0
/mnt/hdfs/haruna/home/byte_data_seed/ssd_hldy/user/tongyx361/data/verl/models/Qwen2.5-32B
-
true
true
0
22528
true
8
true
true
bfloat16
true
Crashed
-
tongyuxuan361
6d 21h 36m 16s
-
0.2
10
0.28
0.2
0
-1
true
true
0
1
0.0001
low_var_kl
0
0.000001
20
0
17495000
constant
0.1
1
11264
512
false
fsdp
8
true
false
true
true
0
0
0
/file_system/verl/models/Qwen2.5-32B
/file_system/verl/models/Qwen2.5-32B
true
true
0
11264
true
8
true
true
bfloat16
true
Crashed
-
tongyuxuan361
1d 5h 43m 21s
-
0.2
10
0.28
0.2
0
-1
true
true
0
1
0.0001
low_var_kl
0
0.000001
20
0
17495000
constant
0.1
1
11264
512
false
fsdp
8
true
false
true
true
0
0
0
/file_system/verl/models/Qwen2.5-32B
/file_system/verl/models/Qwen2.5-32B
true
true
0
11264
true
8
true
true
bfloat16
true
Finished
-
tongyuxuan361
3h 9m 57s
-
0.2
10
0.28
0.2
0
-1
true
true
0
1
0.0001
low_var_kl
0
0.000001
20
0
17495000
constant
0.1
1
25000
512
false
fsdp
8
true
false
true
true
0
0
0
/file_system/verl/models/Qwen2.5-32B
/file_system/verl/models/Qwen2.5-32B
true
true
0
25000
true
8
true
true
bfloat16
true
Finished
-
tongyuxuan361
1d 16h 16m 40s
-
0.2
10
0.28
0.2
0
-1
true
true
0
1
0.0001
low_var_kl
0
0.000001
20
0
17495000
constant
0.1
1
50000
512
false
fsdp
8
true
false
true
true
0
0
0
/file_system/verl/models/Qwen2.5-32B
/file_system/verl/models/Qwen2.5-32B
true
true
0
50000
true
8
true
true
bfloat16
true
Finished
-
tongyuxuan361
15h 15m 21s
-
0.2
10
0.28
0.2
0
-1
true
true
0
1
0.0001
low_var_kl
0
0.000001
20
0
17495000
constant
0.1
1
50000
512
false
fsdp
8
true
false
true
true
0
0
0
/file_system/verl/models/Qwen2.5-32B
/file_system/verl/models/Qwen2.5-32B
true
true
0
50000
true
8
true
true
bfloat16
true
Crashed
-
tongyuxuan361
14h 28m 41s
-
0.2
10
0.28
0.2
0
-1
true
true
0
1
0.0001
low_var_kl
0
0.000001
20
0
17495000
constant
0.1
1
50000
512
false
fsdp
8
true
false
true
true
0
0
0
/file_system/verl/models/Qwen2.5-32B
/file_system/verl/models/Qwen2.5-32B
true
true
0
50000
true
8
true
true
bfloat16
true
1-11
of 11